diff --git a/xdl/CMakeLists.txt b/xdl/CMakeLists.txt
index 639a207c..7d4df997 100644
--- a/xdl/CMakeLists.txt
+++ b/xdl/CMakeLists.txt
@@ -1,10 +1,12 @@
project(xdl)
-cmake_minimum_required(VERSION 2.8)
+cmake_minimum_required(VERSION 3.0.0 FATAL_ERROR)
+SET(CMAKE_MODULE_PATH "${PROJECT_SOURCE_DIR}/cmake")
include(${PROJECT_SOURCE_DIR}/cmake/Utils.cmake)
xdl_option(test "Build all tests." ON)
xdl_option(USE_GPU "use gpu" off)
+xdl_option(USE_PS_PLUS "use ps-plus" ON)
xdl_option(coverage "Generate coverage analysis" off)
enable_testing()
@@ -46,12 +48,21 @@ include_directories(
include(cmake/Dependencies.cmake)
+set(TBB_ROOT "${PROJECT_SOURCE_DIR}/third_party/tbb/")
+include(${TBB_ROOT}/cmake/TBBBuild.cmake)
+set(CMAKE_CXX_FLAGS "-std=c++1y ${CMAKE_CXX_FLAGS}")
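+# Build the bundled TBB at configure time; tbb_build populates TBB_DIR so the
+# find_package(TBB) call below can locate the generated TBB config files.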
+tbb_build(TBB_ROOT ${TBB_ROOT} CONFIG_DIR TBB_DIR MAKE_ARGS)
+find_package(TBB REQUIRED)
+include_directories("${TBB_ROOT}/include")
+
IF (USE_GPU)
+ set(CUDA_PATH "/usr/local/cuda-9.0/")
set(CUDA_TOOLKIT_ROOT_DIR ${CUDA_PATH})
find_package(CUDA REQUIRED)
message("-- CUDA_PATH = ${CUDA_PATH} ")
include(${PROJECT_SOURCE_DIR}/cmake/Cuda.cmake)
include_directories(
+ ${CUDA_PATH}/targets/x86_64-linux/include/
${CUDA_PATH}/include/
)
link_directories(
@@ -62,7 +73,7 @@ ENDIF ()
# PS_PLUS
set(SEASTAR_LIBRARYS -Wl,--whole-archive seastar_service ps_network_static seastar -Wl,--no-whole-archive -L/usr/local/lib64/boost -lboost_timer -lboost_chrono -laio -lboost_program_options -lboost_system -lboost_filesystem -lm -lboost_thread -lcryptopp -lrt -lgnutls -lgnutlsxx -llz4 -ldl -lgcc_s -lunwind -lhwloc -lnuma -lpciaccess -lxml2 -lz -lcares-seastar libstdc++.a)
-set(PS_LIBRARYS -Wl,--whole-archive libzookeeper.a libhashtable.a ps_common ps_client ps_server ps_model_server ps_plugin_hdfs libevent_core.a glog -Wl,--no-whole-archive ${SEASTAR_LIBRARYS})
+set(PS_LIBRARYS -Wl,--whole-archive libzookeeper.a libhashtable.a ps_common ps_client ps_server ps_scheduler ps_model_server ps_plugin_hdfs libevent_core.a -Wl,--no-whole-archive ${SEASTAR_LIBRARYS})
include_directories(${PROJECT_SOURCE_DIR}/ps-plus/)
include_directories(${PROJECT_SOURCE_DIR}/third_party/zookeeper-client/include)
include_directories(${PROJECT_SOURCE_DIR}/third_party/zookeeper-client/generated)
@@ -96,11 +107,12 @@ IF (MXNET_BACKEND)
ENDIF()
IF (USE_GPU)
- set(XDL_CORE_DEPEND_LIB libprotobuf ${PS_LIBRARYS} ${BACKEND_LIB} python2.7 cudart dl)
+ set(XDL_CORE_DEPEND_LIB libprotobuf ${PS_LIBRARYS} ${BACKEND_LIB} python2.7 cudart dl ${TBB_IMPORTED_TARGETS})
ELSE ()
- set(XDL_CORE_DEPEND_LIB libprotobuf ${PS_LIBRARYS} ${BACKEND_LIB} python2.7 dl)
+ set(XDL_CORE_DEPEND_LIB libprotobuf ${PS_LIBRARYS} ${BACKEND_LIB} python2.7 dl ${TBB_IMPORTED_TARGETS})
ENDIF ()
+set(XDL_IO_DEPEND_LIB dl rdkafka++ jsoncpp)
set(XDL_CORE_LIB -Wl,--whole-archive xdl_core -Wl,--no-whole-archive ${XDL_CORE_DEPEND_LIB})
set(XDL_IO_LIB -Wl,--whole-archive xdl_io -Wl,--no-whole-archive)
diff --git a/xdl/cmake/FindNumPy.cmake b/xdl/cmake/FindNumPy.cmake
new file mode 100644
index 00000000..229ff63c
--- /dev/null
+++ b/xdl/cmake/FindNumPy.cmake
@@ -0,0 +1,42 @@
+# Find the Python NumPy package
+# PYTHON_NUMPY_INCLUDE_DIR
+# PYTHON_NUMPY_FOUND
+# will be set by this script
+
+cmake_minimum_required(VERSION 2.6)
+
+if(NOT PYTHON_EXECUTABLE)
+ if(NumPy_FIND_QUIETLY)
+ find_package(PythonInterp QUIET)
+ else()
+ find_package(PythonInterp)
+ set(__numpy_out 1)
+ endif()
+endif()
+
+if (PYTHON_EXECUTABLE)
+ # Find out the include path
+ execute_process(
+ COMMAND "${PYTHON_EXECUTABLE}" -c
+ "from __future__ import print_function\ntry: import numpy; print(numpy.get_include(), end='')\nexcept:pass\n"
+ OUTPUT_VARIABLE __numpy_path)
+ # And the version
+ execute_process(
+ COMMAND "${PYTHON_EXECUTABLE}" -c
+ "from __future__ import print_function\ntry: import numpy; print(numpy.__version__, end='')\nexcept:pass\n"
+ OUTPUT_VARIABLE __numpy_version)
+elseif(__numpy_out)
+ message(STATUS "Python executable not found.")
+endif(PYTHON_EXECUTABLE)
+
+find_path(PYTHON_NUMPY_INCLUDE_DIR numpy/arrayobject.h
+ HINTS "${__numpy_path}" "${PYTHON_INCLUDE_PATH}" NO_DEFAULT_PATH)
+
+if(PYTHON_NUMPY_INCLUDE_DIR)
+ set(PYTHON_NUMPY_FOUND 1 CACHE INTERNAL "Python numpy found")
+endif(PYTHON_NUMPY_INCLUDE_DIR)
+
+include(FindPackageHandleStandardArgs)
+find_package_handle_standard_args(NumPy REQUIRED_VARS PYTHON_NUMPY_INCLUDE_DIR
+ VERSION_VAR __numpy_version)
+
diff --git a/xdl/cmake/Utils.cmake b/xdl/cmake/Utils.cmake
index 2f410602..d04165a6 100644
--- a/xdl/cmake/Utils.cmake
+++ b/xdl/cmake/Utils.cmake
@@ -414,6 +414,26 @@ function(xdl_add_test dir extension)
endforeach()
endfunction()
+function(xdl_add_test_exclude dir extension exclude)
+ file(GLOB TEST_SOURCE "${dir}/*${extension}")
+ foreach(file ${TEST_SOURCE})
+ get_filename_component(file_name ${file} NAME)
+ get_filename_component(file_exe ${file} NAME_WE)
+ if ("${file_name}" STREQUAL "${exclude}" OR "${file_exe}" STREQUAL "${exclude}")
+ message(STATUS "Skip " ${exclude})
+ continue()
+ endif()
+ #message(${extension})
+ #message(${file})
+ #message(${file_exe})
+ #message(${exclude})
+ add_executable(${file_exe} ${file})
+ target_link_libraries(${file_exe} ${ARGN} gcov)
+ set_target_properties(${file_exe} PROPERTIES COMPILE_FLAGS "-g -O0 --coverage")
+ add_test(${file_exe} ${file_exe} COMMAND ${file_exe})
+ endforeach()
+endfunction()
+
function(xdl_add_cuda_test dir extension)
file(GLOB TEST_SOURCE "${dir}/*${extension}")
foreach(file ${TEST_SOURCE})
diff --git a/xdl/distributed/install_xdl_submit.sh b/xdl/distributed/install_xdl_submit.sh
index b8c03ab1..739fa44e 100644
--- a/xdl/distributed/install_xdl_submit.sh
+++ b/xdl/distributed/install_xdl_submit.sh
@@ -22,4 +22,6 @@ fi
cd $(dirname ${BASH_SOURCE[0]})
cp ./xdl_submit/xdl_submit.py /usr/bin/xdl_submit.py
+chmod 777 /usr/bin/xdl_submit.py
cp ./xdl_yarn_scheduler/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar /usr/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar
+chmod 777 /usr/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar
diff --git a/xdl/distributed/xdl_yarn_scheduler/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar b/xdl/distributed/xdl_yarn_scheduler/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar
index 4ae183e0..b106e363 100644
Binary files a/xdl/distributed/xdl_yarn_scheduler/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar and b/xdl/distributed/xdl_yarn_scheduler/bin/xdl-yarn-scheduler-1.0.0-SNAPSHOT-jar-with-dependencies.jar differ
diff --git a/xdl/distributed/xdl_yarn_scheduler/pom.xml b/xdl/distributed/xdl_yarn_scheduler/pom.xml
index 0b007d8b..43ce157a 100644
--- a/xdl/distributed/xdl_yarn_scheduler/pom.xml
+++ b/xdl/distributed/xdl_yarn_scheduler/pom.xml
@@ -76,7 +76,7 @@
<groupId>com.alibaba</groupId>
<artifactId>fastjson</artifactId>
- <version>1.2.28</version>
+ <version>1.2.58</version>
diff --git a/xdl/examples/mnist/mnist.py b/xdl/examples/mnist/mnist.py
index c14f4a34..bef5484f 100644
--- a/xdl/examples/mnist/mnist.py
+++ b/xdl/examples/mnist/mnist.py
@@ -80,7 +80,7 @@ def model(images, labels):
@xdl.tf_wrapper(is_training=False)
def eval_model(images, labels):
- with tf.variable_scope("train", reuse=True):
+ with tf.variable_scope("train", reuse=tf.AUTO_REUSE):
eval_y = fc(images, [784, 10], [10])
labels_test = tf.cast(labels, tf.int64)
correct_prediction = tf.equal(tf.argmax(eval_y, 1), labels_test)
diff --git a/xdl/ps-plus/CMakeLists.txt b/xdl/ps-plus/CMakeLists.txt
index cb896f6b..4761d25a 100755
--- a/xdl/ps-plus/CMakeLists.txt
+++ b/xdl/ps-plus/CMakeLists.txt
@@ -1,28 +1,90 @@
-cmake_minimum_required(VERSION 2.8)
+cmake_minimum_required(VERSION 3.0.0 FATAL_ERROR)
project(ps-plus)
if (DEBUG)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -fPIC -std=c++1y -D_GLIBCXX_USE_CXX11_ABI=0")
else ()
- set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -fPIC -std=c++1y -g -DNDEBUG -D_GLIBCXX_USE_CXX11_ABI=0")
+ set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -fPIC -std=c++1y -g -DNDEBUG -D_GLIBCXX_USE_CXX11_ABI=0")
endif ()
if (APPLE)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS}")
elseif (UNIX)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -pthread")
-endif()
+endif ()
+
+include_directories(.)
+
+set(CMAKE_SKIP_BUILD_RPATH FALSE)
+set(CMAKE_BUILD_WITH_INSTALL_RPATH TRUE)
+set(CMAKE_INSTALL_RPATH "/usr/local/lib:/usr/local/lib64/boost:/usr/local/gcc-5.3.0/lib64")
+set(CMAKE_INSTALL_RPATH_USE_LINK_PATH TRUE)
+
+# build third_party libraries using cmake
+function (third_party_library_builder_cmake arg)
+ list(LENGTH ARGV argv_len)
+ set(i 0)
+ while( i LESS ${argv_len})
+ list(GET ARGV ${i} argv_value)
+ message(STATUS "start build third_party library:${argv_value}")
+ execute_process(COMMAND bash -c "cd ${PROJECT_SOURCE_DIR}/third_party/${argv_value}; mkdir -p build; cd build; cmake .. -DCMAKE_INSTALL_PREFIX=. -DCMAKE_CXX_FLAGS=-D_GLIBCXX_USE_CXX11_ABI=0; make; make install; cd ${PROJECT_SOURCE_DIR}")
+ IF(EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/include")
+ include_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/include")
+ ENDIF()
+ IF(EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib")
+ link_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib")
+ ENDIF()
+ IF(EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib64")
+ link_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib64")
+ ENDIF()
+ math(EXPR i "${i} + 1")
+ endwhile()
+endfunction ()
+
+# build third_party libraries using autotools
+function (third_party_library_builder_autotools arg)
+ list(LENGTH ARGV argv_len)
+ set(i 0)
+ while (i LESS ${argv_len})
+ list(GET ARGV ${i} argv_value)
+ message(STATUS "Start to build third_party library: ${argv_value}")
+ execute_process(COMMAND bash -c "
+ cd ${PROJECT_SOURCE_DIR}/third_party/${argv_value};
+ mkdir -p build;
+ ./configure --prefix=$(pwd)/build CXXFLAGS='-D_GLIBCXX_USE_CXX11_ABI=0' LDFLAGS='-D_GLIBCXX_USE_CXX11_ABI=0';
+ make;
+ make install;
+ cd ${PROJECT_SOURCE_DIR}")
+ if (EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/include")
+ include_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/include")
+ endif ()
+ if (EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib")
+ link_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib")
+ endif ()
+ if (EXISTS "${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib64")
+ link_directories("${PROJECT_SOURCE_DIR}/third_party/${argv_value}/build/lib64")
+ endif ()
+ math(EXPR i "${i} + 1")
+ endwhile ()
+endfunction ()
set(CMAKE_SHARED_LIBRARY_SUFFIX ".so")
+function (compile_protobuf dir)
+ file(GLOB pbs ${PROJECT_SOURCE_DIR}/${dir}/*.proto)
+ execute_process(COMMAND ${PROTOBUF_PROTOC_EXECUTABLE} ${pbs} --cpp_out=${PROJECT_SOURCE_DIR} --proto_path=${PROJECT_SOURCE_DIR})
+endfunction()
-include_directories(.)
+find_package(NumPy REQUIRED)
+find_package(PythonLibs REQUIRED)
link_directories(${PROJECT_BINARY_DIR}/third_party/googletest/)
link_directories(${PROJECT_BINARY_DIR}/third_party/zookeeper-client/)
-link_directories(${PROJECT_BINARY_DIR}/third_party/glog/)
+include_directories("${PYTHON_NUMPY_INCLUDE_DIR}")
+include_directories("${PYTHON_INCLUDE_DIRS}")
-include_directories(${PROJECT_SOURCE_DIR}/third_party/glog/)
include_directories(${PROJECT_SOURCE_DIR}/third_party/hdfs/)
+include_directories(${PROJECT_SOURCE_DIR}/third_party/seastar/ ${PROJECT_SOURCE_DIR}/third_party/seastar/fmt ${PROJECT_SOURCE_DIR}/third_party/seastar/c-ares)
+link_directories("${PROJECT_SOURCE_DIR}/third_party/seastar/lib")
aux_source_directory(ps-plus/service/seastar/lib SEASTAR_LIB)
add_library(seastar_service STATIC ${SEASTAR_LIB})
@@ -35,7 +97,7 @@ if (USE_HDFS OR NOT DEFINED USE_HDFS)
SET(PLUGINS ${PLUGINS} ps_plugin_hdfs)
endif()
-set(LIBRARYS -Wl,--whole-archive ps_common ps_server ps_model_server ps_client ps_scheduler libhashtable.a libzookeeper.a libevent_core.a ${PLUGINS} glog -Wl,--no-whole-archive ${PLUGINS_DEPENDENCY} ${SEASTAR_LIBRARYS})
+set(LIBRARYS -Wl,--whole-archive ps_common ps_server ps_model_server ps_client ps_scheduler libhashtable.a libzookeeper.a libevent_core.a ${PLUGINS} -Wl,--no-whole-archive ${PLUGINS_DEPENDENCY} ${SEASTAR_LIBRARYS} ${PYTHON_LIBRARIES})
aux_source_directory(ps-plus/common COMMON)
aux_source_directory(ps-plus/common/initializer COMMON_INITIALIZER)
@@ -52,7 +114,6 @@ aux_source_directory(ps-plus/scheduler/test SCHEDULER_TEST)
aux_source_directory(ps-plus/main MAIN)
aux_source_directory(ps-plus/model_server MODEL_SERVER)
aux_source_directory(ps-plus/model_server/test MODEL_SERVER_TEST)
-aux_source_directory(ps-plus/tool CLIENT_TOOL)
aux_source_directory(ps-plus/profiler PROFILER)
aux_source_directory(ps-plus/common/test COMMON_TEST)
aux_source_directory(ps-plus/common/initializer/test COMMON_INITIALIZER_TEST)
@@ -72,7 +133,7 @@ add_library(ps_client STATIC ${CLIENT} ${CLIENT_PARTITIONER})
add_library(ps_plugin_hdfs STATIC ${PLUGINS_HDFS})
add_executable(ps ${MAIN})
-add_executable(tool ${CLIENT_TOOL})
+add_executable(tool ps-plus/tool/client_tool.cpp)
# tests
add_executable(ps_common_test ${COMMON_TEST} ${COMMON_INITIALIZER_TEST} ${SRC_TEST_UTIL})
@@ -85,15 +146,15 @@ add_executable(ps_scheduler_test ${SCHEDULER_TEST})
# profiler
add_executable(ps_profiler ${PROFILER})
-target_link_libraries(ps ${LIBRARYS} libjemalloc.a)
-target_link_libraries(tool ${LIBRARYS} libjemalloc.a)
-target_link_libraries(ps_common_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_message_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_model_server_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_server_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_client_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_scheduler_test ${LIBRARYS} gtest gtest_main libjemalloc.a)
-target_link_libraries(ps_profiler ${LIBRARYS} libjemalloc.a)
+target_link_libraries(ps ${LIBRARYS} libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(tool ${LIBRARYS} libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_common_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_message_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_model_server_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_server_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_client_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_scheduler_test ${LIBRARYS} gtest gtest_main libjemalloc.a ${TBB_IMPORTED_TARGETS})
+target_link_libraries(ps_profiler ${LIBRARYS} libjemalloc.a ${TBB_IMPORTED_TARGETS})
enable_testing()
add_test(NAME ps_common_test COMMAND ps_common_test)
diff --git a/xdl/ps-plus/README.md b/xdl/ps-plus/README.md
index 8461cf40..14861b37 100644
--- a/xdl/ps-plus/README.md
+++ b/xdl/ps-plus/README.md
@@ -1,3 +1,18 @@
+/* Copyright (C) 2016-2018 Alibaba Group Holding Limited
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
# Using ps-plus
ps-plus is the underlying parameter server (PS) component; it can be integrated on its own into other business systems. Basic usage is as follows:
diff --git a/xdl/ps-plus/ps-plus/client/base_client.h b/xdl/ps-plus/ps-plus/client/base_client.h
index edb96a98..92ab3cd6 100644
--- a/xdl/ps-plus/ps-plus/client/base_client.h
+++ b/xdl/ps-plus/ps-plus/client/base_client.h
@@ -22,9 +22,11 @@ limitations under the License.
#include "ps-plus/common/status.h"
#include "ps-plus/common/tensor.h"
#include "ps-plus/message/variable_info.h"
+#include "ps-plus/message/worker_state.h"
#include "ps-plus/client/udf.h"
#include "ps-plus/client/partitioner.h"
+#include "ps-plus/client/merged_partitioner.h"
namespace ps {
namespace client {
@@ -37,17 +39,35 @@ class BaseClient {
virtual Status Init() = 0;
virtual void Save(const std::string& name, const Callback& cb) = 0;
virtual void Restore(const std::string& name, const Callback& cb) = 0;
- virtual void TriggerStreamingModelDense(const Callback& cb) = 0;
- virtual void TriggerStreamingModelSparse(const Callback& cb) = 0;
- virtual void TriggerStreamingModelHash(const Callback& cb) = 0;
-
+ virtual void TriggerStreamingModelDense(const std::string& stream_ver, const Callback& cb) = 0;
+ virtual void TriggerStreamingModelSparse(const std::string& stream_ver, const Callback& cb) = 0;
+ virtual void TriggerStreamingModelHash(const std::string& stream_ver, const Callback& cb) = 0;
+ virtual Status InitGlobalQueue(
+ const std::string& name,
+ const std::vector<std::string>& paths,
+ size_t epochs,
+ bool epoch_isolate = false) = 0;
+ virtual Status GetNextFile(
+ const std::string& name,
+ size_t worker_id,
+ std::string* path,
+ size_t* begin,
+ size_t* epoch) = 0;
+ virtual Status ReportWorkerState(
+ const std::string& name,
+ size_t worker_id,
+ const std::vector<WorkerState>& worker_states) = 0;
+ virtual Status RestoreWorkerState(
+ const std::string& name,
+ size_t worker_id) = 0;
virtual Status RegisterVariable(const std::string& name, const VariableInfo& info) = 0;
-
virtual void AsynchronizeEnter(int id, int staleness, int worker_count, const Callback& cb) = 0;
virtual void SynchronizeEnter(int id, int worker_count, const Callback& cb) = 0;
virtual void SynchronizeLeave(int id, const Callback& cb) = 0;
virtual void WorkerReportFinish(int id, const Callback& cb) = 0;
+ virtual void GetWorkerFinishCount(int64_t* count, const Callback& cb) = 0;
virtual void WorkerBarrier(int id, int worker_count, const Callback& cb) = 0;
+ virtual void WorkerBarrierV2(int barrier_id, int task_id, int task_num, int token, const Callback& cb) = 0;
virtual void ModelServerForward(int type, const Tensor& ids, Tensor* rst, const Callback& cb) = 0;
virtual void ModelServerBackward(int type, const Tensor& ids, const Tensor& grads, const Callback& cb) = 0;
@@ -58,7 +78,7 @@ class BaseClient {
const Tensor& init,
const Callback& cb) = 0;
virtual void HashInitializer(const std::string& variable_name,
- Initializer* init,
+ Initializer* init,
const Callback& cb) = 0;
virtual void IsInitialized(const std::string& variable_name,
bool* inited,
@@ -80,23 +100,54 @@ class BaseClient {
const std::vector<Data*>& data,
const Callback& cb) = 0;
virtual void HashPull(const std::string& variable_name,
- const Tensor& ids,
- double add_probability,
+ const Tensor& ids,
+ const float& save_ratio,
Tensor* result,
const Callback& cb) = 0;
+ virtual void MergedHashPull(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ std::vector<Tensor>* result,
+ const Callback& cb) = 0;
virtual void HashPush(const std::string& variable_name,
- const Tensor& ids,
- const std::string& updater,
+ const Tensor& ids,
+ const float& save_ratio,
+ const bool& insertable,
+ const std::string& updater,
const std::vector<Data*>& data,
const Callback& cb) = 0;
+ virtual void MergedHashPush(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::string& updater,
+ const std::vector<Data*>& data,
+ const Callback& cb) = 0;
+ virtual void MergedHashStatis(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::vector<Tensor>& clicks,
+ const Tensor& global_step,
+ const Tensor& statis_decay,
+ const Tensor& statis_decay_period,
+ const std::string& statis_type,
+ std::vector<Tensor>* result,
+ const Callback& cb) = 0;
+
+ virtual void Process(const UdfChain& udf,
+ const std::string& var_name,
+ const std::vector<Data*>& datas,
+ const std::vector<Partitioner*>& splitter,
+ const std::vector<Partitioner*>& combiner,
+ std::vector<std::unique_ptr<Data>>* results,
+ const Callback& cb) = 0;
virtual void Process(const UdfChain& udf,
- const std::string& var_name,
- const std::vector<Data*>& datas,
- const std::vector<Partitioner*>& splitter,
- const std::vector<Partitioner*>& combiner,
- std::vector<std::unique_ptr<Data>>* results,
- const Callback& cb) = 0;
+ const std::vector<std::string>& var_names,
+ const std::vector<Data*>& datas,
+ const std::vector<MergedPartitioner*>& splitter,
+ const std::vector<MergedPartitioner*>& combiner,
+ std::vector<std::vector<std::unique_ptr<Data>>>* results,
+ const Callback& cb) = 0;
template <typename... Targs>
std::vector<Data*> Args(Targs&&... args) {
diff --git a/xdl/ps-plus/ps-plus/client/client.cc b/xdl/ps-plus/ps-plus/client/client.cc
index 736add32..bdcff71a 100644
--- a/xdl/ps-plus/ps-plus/client/client.cc
+++ b/xdl/ps-plus/ps-plus/client/client.cc
@@ -18,8 +18,10 @@ limitations under the License.
#include "ps-plus/client/partitioner/logic.h"
#include "ps-plus/client/partitioner/sparse.h"
#include "ps-plus/client/partitioner/broadcast.h"
+#include "ps-plus/client/partitioner/merged_broadcast.h"
#include "ps-plus/client/partitioner/index.h"
#include "ps-plus/client/partitioner/hash.h"
+#include "ps-plus/client/partitioner/merged_hash.h"
#include
#include
@@ -91,18 +93,26 @@ void Client::IdentityInitializer(const std::string& variable_name,
}
void Client::HashInitializer(const std::string& variable_name,
- Initializer* init,
+ Initializer* init,
const Client::Callback& cb) {
- std::vector<Data*> inputs = Args(0, 0, std::unique_ptr<Initializer>(init));
+ VariableInfo info;
+ CHECK_ASYNC(GetVariableInfo(variable_name, &info));
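+ // Flatten the variable's args into a "k1=v1&k2=v2" string so they can be
+ // shipped to the HashVariableInitializer UDF alongside the initializer.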
+ std::string extra_info;
+ for (auto& arg : info.args) {
+ extra_info += arg.first + "=" + arg.second + "&";
+ }
+ if (!extra_info.empty()) { extra_info.pop_back(); }
+ std::vector<Data*> inputs = Args(0, 0, extra_info, std::unique_ptr<Initializer>(init));
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
std::vector<Partitioner*> splitter = {
new partitioner::HashDataType,
new partitioner::HashShape,
+ new partitioner::Broadcast,
new partitioner::Broadcast
};
std::vector<Partitioner*> combiner = {};
- UdfData udf("HashVariableInitializer", UdfData(0), UdfData(1), UdfData(2));
+ UdfData udf("HashVariableInitializer", UdfData(0), UdfData(1), UdfData(2), UdfData(3));
Callback realcb = [cb, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
cb(st);
@@ -150,7 +160,7 @@ void Client::DensePull(const std::string& variable_name,
std::vector<Partitioner*> combiner = { new partitioner::Dense };
UdfData udf("BuildDenseSlice", UdfData(0));
UdfData udf_chain("TransSlice", udf);
- Callback realcb = [this, cb, result, outputs, &variable_name](const Status& st) {
+ Callback realcb = [this, cb, result, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
if (!st.IsOk()) {
cb(st);
@@ -217,7 +227,8 @@ void Client::DensePush(const std::string& variable_name,
inputs.insert(inputs.end(), data.begin(), data.end());
for (size_t i = start_index; i < inputs.size(); i++) {
- if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr) {
+ if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr
+ || dynamic_cast<WrapperData<std::vector<Tensor>>*>(inputs[i]) != nullptr) {
splitter.push_back(new partitioner::Dense);
} else {
splitter.push_back(new partitioner::Broadcast);
@@ -323,7 +334,8 @@ void Client::SparsePush(const std::string& variable_name,
inputs.insert(inputs.end(), data.begin(), data.end());
for (size_t i = start_index; i < inputs.size(); i++) {
- if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr) {
+ if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr
+ || dynamic_cast<WrapperData<std::vector<Tensor>>*>(inputs[i]) != nullptr) {
splitter.push_back(new partitioner::SparseData);
} else {
splitter.push_back(new partitioner::Broadcast);
@@ -342,22 +354,27 @@ void Client::SparsePush(const std::string& variable_name,
}
void Client::HashPull(const std::string& variable_name,
- const Tensor& ids,
- double add_probability,
- Tensor* result,
+ const Tensor& ids,
+ const float& save_ratio,
+ Tensor* result,
const Client::Callback& cb) {
- std::vector<Data*> inputs = Args(ids, false, add_probability);
+ std::vector<Tensor> ids_vec = {ids};
+ std::vector<std::string> name_vec = {variable_name};
+ std::vector<float> save_ratio_vec = {save_ratio};
+ std::vector<Data*> inputs = Args(ids_vec, name_vec, save_ratio_vec, false, true);
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
std::vector<Partitioner*> splitter = {
new partitioner::HashId,
new partitioner::Broadcast,
- new partitioner::Broadcast
+ new partitioner::Broadcast,
+ new partitioner::Broadcast,
+ new partitioner::Broadcast
};
std::vector<Partitioner*> combiner = {
new partitioner::HashData
};
- UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2));
+ UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(3), UdfData(4));
UdfData udf_chain("TransSlice", udf);
Callback realcb = [cb, result, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
@@ -393,23 +410,81 @@ void Client::HashPull(const std::string& variable_name,
}
}
+void Client::MergedHashPull(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ std::vector<Tensor>* result,
+ const Client::Callback& cb) {
+ std::vector<Data*> inputs = Args(ids, var_names, save_ratios, false, true);
+ std::vector<std::vector<std::unique_ptr<Data>>>* outputs =
+ new std::vector<std::vector<std::unique_ptr<Data>>>;
+ std::vector<MergedPartitioner*> splitter = {
+ new partitioner::MergedHashId,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast
+ };
+ std::vector<MergedPartitioner*> combiner = {
+ new partitioner::MergedHashData
+ };
+ UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(3), UdfData(4));
+ Callback realcb = [cb, result, outputs, var_names](const Status& st) {
+ std::unique_ptr<std::vector<std::vector<std::unique_ptr<Data>>>> deleter(outputs);
+ if (!st.IsOk()) {
+ cb(st);
+ return;
+ }
+
+ if (outputs->size() != 1) {
+ cb(Status::ArgumentError("Output Size Should be 1 on MergedHashPull"));
+ return;
+ }
+
+ std::vector<std::unique_ptr<Data>>& output_vec = (*outputs)[0];
+ if (output_vec.size() != var_names.size()) {
+ cb(Status::ArgumentError("Output[0] Size Should be the Same with Variable Number"));
+ return;
+ }
+ for (auto& output : output_vec) {
+ WrapperData<Tensor>* output_ptr = dynamic_cast<WrapperData<Tensor>*>(output.get());
+ if (output_ptr == nullptr) {
+ cb(Status::ArgumentError("Output[0] should be tensor vector"));
+ return;
+ }
+ (*result).push_back(output_ptr->Internal());
+ }
+ cb(Status::Ok());
+ };
+
+ Process(udf, var_names, inputs, splitter,
+ combiner, outputs, realcb);
+}
+
void Client::HashPush(const std::string& variable_name,
- const Tensor& ids,
- const std::string& updater,
+ const Tensor& ids,
+ const float& save_ratio,
+ const bool& insertable,
+ const std::string& updater,
const std::vector& data,
const Client::Callback& cb) {
- std::vector<Data*> inputs = Args(ids, true, 0.0);
- size_t start_index = 3;
+ std::vector<Tensor> ids_vec = {ids};
+ std::vector<std::string> name_vec = {variable_name};
+ std::vector<float> save_ratio_vec = {save_ratio};
+ std::vector<Data*> inputs = Args(ids_vec, name_vec, save_ratio_vec, true, insertable);
+ size_t start_index = 5;
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
std::vector<Partitioner*> splitter = {
new partitioner::HashId,
- new partitioner::Broadcast,
- new partitioner::Broadcast
+ new partitioner::Broadcast,
+ new partitioner::Broadcast,
+ new partitioner::Broadcast,
+ new partitioner::Broadcast
+ };
std::vector<Partitioner*> combiner = {};
std::vector<UdfData> next_udf_inputs = {
- UdfData("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2))
+ UdfData("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(3), UdfData(4))
};
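// Sync mode (all updaters except the assign/moving-average ones): append the
// sync token and worker count, and wrap the slice in an AggregateSlice UDF first.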
if (sync_mode_ &&
@@ -419,20 +494,21 @@ void Client::HashPush(const std::string& variable_name,
updater != "MovingAverageUpdater") {
inputs.push_back(Args(token_)[0]);
inputs.push_back(Args(worker_count_)[0]);
- next_udf_inputs.push_back(UdfData(3));
- next_udf_inputs.push_back(UdfData(4));
- next_udf_inputs.push_back(UdfData(5));
+ next_udf_inputs.push_back(UdfData(5));
+ next_udf_inputs.push_back(UdfData(6));
+ next_udf_inputs.push_back(UdfData(7));
splitter.push_back(new partitioner::Broadcast);
splitter.push_back(new partitioner::Broadcast);
splitter.push_back(new partitioner::HashData);
UdfData aggregate("AggregateSlice", next_udf_inputs);
next_udf_inputs = {aggregate};
- start_index = 6;
+ start_index = 8;
}
inputs.insert(inputs.end(), data.begin(), data.end());
for (size_t i = start_index; i < inputs.size(); i++) {
- if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr) {
+ if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr
+ || dynamic_cast<WrapperData<std::vector<Tensor>>*>(inputs[i]) != nullptr) {
splitter.push_back(new partitioner::HashData);
} else {
splitter.push_back(new partitioner::Broadcast);
@@ -450,5 +526,128 @@ void Client::HashPush(const std::string& variable_name,
combiner, outputs, realcb);
}
+void Client::MergedHashPush(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::string& updater,
+ const std::vector<Data*>& data,
+ const Client::Callback& cb) {
+ std::vector<Data*> inputs = Args(ids, var_names, save_ratios, true, false);
+ size_t start_index = 5;
+ std::vector<std::vector<std::unique_ptr<Data>>>* outputs =
+ new std::vector<std::vector<std::unique_ptr<Data>>>;
+ std::vector<MergedPartitioner*> splitter = {
+ new partitioner::MergedHashId,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast
+ };
+ std::vector<MergedPartitioner*> combiner = {};
+ std::vector<UdfData> next_udf_inputs = {
+ UdfData("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(3), UdfData(4))
+ };
+
+ if (sync_mode_ &&
+ updater != "AssignUpdater" &&
+ updater != "AssignAddUpdater" &&
+ updater != "AssignSubUpdater" &&
+ updater != "MovingAverageUpdater") {
+ inputs.push_back(Args(token_)[0]);
+ inputs.push_back(Args(worker_count_)[0]);
+ next_udf_inputs.push_back(UdfData(5));
+ next_udf_inputs.push_back(UdfData(6));
+ next_udf_inputs.push_back(UdfData(7));
+ splitter.push_back(new partitioner::MergedBroadcast);
+ splitter.push_back(new partitioner::MergedBroadcast);
+ splitter.push_back(new partitioner::MergedHashData);
+ UdfData aggregate("AggregateSlice", next_udf_inputs);
+ next_udf_inputs = {aggregate};
+ start_index = 8;
+ }
+
+ inputs.insert(inputs.end(), data.begin(), data.end());
+ for (size_t i = start_index; i < inputs.size(); i++) {
+ if (dynamic_cast<WrapperData<Tensor>*>(inputs[i]) != nullptr
+ || dynamic_cast<WrapperData<std::vector<Tensor>>*>(inputs[i]) != nullptr) {
+ splitter.push_back(new partitioner::MergedHashData);
+ } else {
+ splitter.push_back(new partitioner::MergedBroadcast);
+ }
+ next_udf_inputs.push_back(UdfData(i));
+ }
+
+ UdfData udf(updater, next_udf_inputs);
+ Callback realcb = [cb, outputs](const Status& st) {
+ std::unique_ptr<std::vector<std::vector<std::unique_ptr<Data>>>> deleter(outputs);
+ cb(st);
+ };
+
+ Process(udf, var_names, inputs, splitter,
+ combiner, outputs, realcb);
+}
+
+void Client::MergedHashStatis(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::vector<Tensor>& clicks,
+ const Tensor& global_step,
+ const Tensor& statis_decay,
+ const Tensor& statis_decay_period,
+ const std::string& statis_type,
+ std::vector<Tensor>* result,
+ const Client::Callback& cb) {
+ std::vector<Data*> inputs = Args(ids, var_names, save_ratios, clicks, global_step, statis_decay, statis_decay_period, statis_type, false, true);
+ std::vector<std::vector<std::unique_ptr<Data>>>* outputs =
+ new std::vector<std::vector<std::unique_ptr<Data>>>;
+ std::vector<MergedPartitioner*> splitter = {
+ new partitioner::MergedHashId,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedHashData,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast,
+ new partitioner::MergedBroadcast
+ };
+ std::vector<MergedPartitioner*> combiner = {
+ new partitioner::MergedHashData
+ };
+ UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(8), UdfData(9));
+ UdfData udf_chain("StatisSlice", udf, UdfData(3), UdfData(4), UdfData(5), UdfData(6), UdfData(7));
+ Callback realcb = [cb, result, outputs, var_names](const Status& st) {
+ std::unique_ptr<std::vector<std::vector<std::unique_ptr<Data>>>> deleter(outputs);
+ if (!st.IsOk()) {
+ cb(st);
+ return;
+ }
+
+ if (outputs->size() != 1) {
+ cb(Status::ArgumentError("Output Size Should be 1 on MergedHashStatis"));
+ return;
+ }
+
+ std::vector<std::unique_ptr<Data>>& output_vec = (*outputs)[0];
+ if (output_vec.size() != var_names.size()) {
+ cb(Status::ArgumentError("Output[0] Size Should be the Same with Variable Number"));
+ return;
+ }
+ for (auto& output : output_vec) {
+ WrapperData<Tensor>* output_ptr = dynamic_cast<WrapperData<Tensor>*>(output.get());
+ if (output_ptr == nullptr) {
+ cb(Status::ArgumentError("Output[0] should be tensor vector"));
+ return;
+ }
+ result->push_back(output_ptr->Internal());
+ }
+ cb(Status::Ok());
+ };
+
+ Process(udf_chain, var_names, inputs, splitter,
+ combiner, outputs, realcb);
+}
+
} //namespace client
} //namespace ps
diff --git a/xdl/ps-plus/ps-plus/client/client.h b/xdl/ps-plus/ps-plus/client/client.h
index 1579106d..57660e7f 100644
--- a/xdl/ps-plus/ps-plus/client/client.h
+++ b/xdl/ps-plus/ps-plus/client/client.h
@@ -19,6 +19,7 @@ limitations under the License.
#include
#include
+#include "ps-plus/common/logging.h"
#include "ps-plus/client/raw_client.h"
#include "ps-plus/client/base_client.h"
#include "ps-plus/common/tensor.h"
@@ -44,11 +45,22 @@ class Client: public BaseClient {
const std::vector<Data*>& datas,
const std::vector<Partitioner*>& splitter,
const std::vector<Partitioner*>& combiner,
- std::vector<std::unique_ptr<Data>>* results,
+ std::vector<std::unique_ptr<Data> >* results,
const Callback& cb) override {
return raw_->Process(udf, var_name, datas, splitter, combiner, results, cb);
}
+ void Process(
+ const UdfChain& udf,
+ const std::vector<std::string>& var_names,
+ const std::vector<Data*>& datas,
+ const std::vector<MergedPartitioner*>& splitter,
+ const std::vector<MergedPartitioner*>& combiner,
+ std::vector<std::vector<std::unique_ptr<Data> > >* results,
+ const Callback& cb) override {
+ return raw_->Process(udf, var_names, datas, splitter, combiner, results, cb);
+ }
+
void Save(const std::string& name, const Callback& cb) override {
return raw_->Save(name, cb);
}
@@ -57,16 +69,46 @@ class Client: public BaseClient {
return raw_->Restore(name, cb);
}
- void TriggerStreamingModelDense(const Callback& cb) override {
- return raw_->TriggerStreamingModelDense(cb);
+ void TriggerStreamingModelDense(const std::string& stream_ver, const Callback& cb) override {
+ return raw_->TriggerStreamingModelDense(stream_ver, cb);
+ }
+
+ Status InitGlobalQueue(
+ const std::string& name,
+ const std::vector<std::string>& paths,
+ size_t epochs,
+ bool epoch_isolate = false) override {
+ return raw_->InitGlobalQueue(name, paths, epochs, epoch_isolate);
+ }
+
+ Status GetNextFile(
+ const std::string& name,
+ size_t worker_id,
+ std::string* path,
+ size_t* begin,
+ size_t* epoch) override {
+ return raw_->GetNextFile(name, worker_id, path, begin, epoch);
+ }
+
+ Status ReportWorkerState(
+ const std::string& name,
+ size_t worker_id,
+ const std::vector<WorkerState>& worker_states) override {
+ return raw_->ReportWorkerState(name, worker_id, worker_states);
}
- void TriggerStreamingModelSparse(const Callback& cb) override {
- return raw_->TriggerStreamingModelSparse(cb);
+ Status RestoreWorkerState(
+ const std::string& name,
+ size_t worker_id) override {
+ return raw_->RestoreWorkerState(name, worker_id);
}
- void TriggerStreamingModelHash(const Callback& cb) override {
- return raw_->TriggerStreamingModelHash(cb);
+ void TriggerStreamingModelSparse(const std::string& stream_ver, const Callback& cb) override {
+ return raw_->TriggerStreamingModelSparse(stream_ver, cb);
+ }
+
+ void TriggerStreamingModelHash(const std::string& stream_ver, const Callback& cb) override {
+ return raw_->TriggerStreamingModelHash(stream_ver, cb);
}
Status RegisterVariable(const std::string& name, const VariableInfo& info) override {
@@ -91,9 +133,17 @@ class Client: public BaseClient {
raw_->WorkerReportFinish(id, cb);
}
+ void GetWorkerFinishCount(int64_t* count, const Callback& cb) {
+ raw_->GetWorkerFinishCount(count, cb);
+ }
+
void WorkerBarrier(int id, int worker_count, const Callback& cb) override {
raw_->WorkerBarrier(id, worker_count, cb);
- }
+ }
+
+ void WorkerBarrierV2(int barrier_id, int task_id, int task_num, int token, const Callback& cb) override {
+ raw_->WorkerBarrierV2(barrier_id, task_id, task_num, token, cb);
+ }
Status UpdateVariableVisitInfo(const std::string& name, int64_t id_num) {
return raw_->UpdateVariableVisitInfo(name, id_num);
@@ -119,7 +169,7 @@ class Client: public BaseClient {
const Tensor& init,
const Callback& cb) override;
void HashInitializer(const std::string& variable_name,
- Initializer* init,
+ Initializer* init,
const Callback& cb) override;
void IsInitialized(const std::string& variable_name,
bool* inited,
@@ -141,15 +191,43 @@ class Client: public BaseClient {
const std::vector<Data*>& data,
const Callback& cb) override;
void HashPull(const std::string& variable_name,
- const Tensor& ids,
- double add_probability,
+ const Tensor& ids,
+ const float& save_ratio,
Tensor* result,
const Callback& cb) override;
+ void MergedHashPull(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ std::vector<Tensor>* result,
+ const Callback& cb) override;
void HashPush(const std::string& variable_name,
- const Tensor& ids,
- const std::string& updater,
+ const Tensor& ids,
+ const float& save_ratio,
+ const bool& insertable,
+ const std::string& updater,
const std::vector<Data*>& data,
const Callback& cb) override;
+ void MergedHashPush(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::string& updater,
+ const std::vector<Data*>& data,
+ const Callback& cb) override;
+ void MergedHashStatis(const std::vector<std::string>& var_names,
+ const std::vector<Tensor>& ids,
+ const std::vector<float>& save_ratios,
+ const std::vector<Tensor>& clicks,
+ const Tensor& global_step,
+ const Tensor& statis_decay,
+ const Tensor& statis_decay_period,
+ const std::string& statis_type,
+ std::vector<Tensor>* result,
+ const Callback& cb) override;
+
+ private:
+ Status GetVariableInfo(const std::string& name, VariableInfo* info) {
+ return raw_->GetVariableInfo(name, info);
+ }
private:
std::unique_ptr raw_;
diff --git a/xdl/ps-plus/ps-plus/client/client_wrapper.h b/xdl/ps-plus/ps-plus/client/client_wrapper.h
index f8b50f74..166c1d80 100644
--- a/xdl/ps-plus/ps-plus/client/client_wrapper.h
+++ b/xdl/ps-plus/ps-plus/client/client_wrapper.h
@@ -20,7 +20,9 @@ limitations under the License.
#include "ps-plus/common/status.h"
#include "ps-plus/client/udf.h"
#include "ps-plus/client/partitioner.h"
+#include "ps-plus/client/merged_partitioner.h"
#include "ps-plus/common/tensor.h"
+#include "ps-plus/message/worker_state.h"
#include
#include
@@ -43,16 +45,22 @@ class ClientWrapper {
virtual void RegisterUdf(size_t server_id, const UdfChain& def, const Callback& cb) = 0;
virtual void Save(const std::string& version, const Callback& cb) = 0;
virtual void Restore(const std::string& version, const Callback& cb) = 0;
+ virtual Status InitGlobalQueue(const std::string& name, const std::vector<std::string>& paths, size_t epochs, bool epoch_isolate = false) = 0;
+ virtual Status GetNextFile(const std::string& name, size_t worker_id, std::string* path, size_t* begin, size_t* epoch) = 0;
+ virtual Status ReportWorkerState(const std::string& name, size_t worker_id, const std::vector<WorkerState>& worker_states) = 0;
+ virtual Status RestoreWorkerState(const std::string& name, size_t worker_id) = 0;
virtual void ModelServerForward(int server_type, int server_id, const Tensor& ids, std::unique_ptr<Tensor>* rst, const Callback& cb) = 0;
virtual void ModelServerBackward(int server_type, int server_id, const Tensor& ids, const Tensor& grads, const Callback& cb) = 0;
- virtual void TriggerStreamingModelDense(const Callback& cb) = 0;
- virtual void TriggerStreamingModelSparse(const Callback& cb) = 0;
- virtual void TriggerStreamingModelHash(const Callback& cb) = 0;
+ virtual void TriggerStreamingModelDense(const std::string& stream_ver, const Callback& cb) = 0;
+ virtual void TriggerStreamingModelSparse(const std::string& stream_ver, const Callback& cb) = 0;
+ virtual void TriggerStreamingModelHash(const std::string& stream_ver, const Callback& cb) = 0;
virtual void AsynchronizeEnter(int id, int staleness, int worker_count, const Callback& cb) = 0;
virtual void SynchronizeEnter(int id, int worker_count, int64_t* token, const Callback& cb) = 0;
virtual void SynchronizeLeave(int id, int64_t token, const Callback& cb) = 0;
virtual void WorkerReportFinish(int id, const Callback& cb) = 0;
+ virtual void GetWorkerFinishCount(int64_t* count, const Callback& cb) = 0;
virtual void WorkerBarrier(int id, int worker_count, const Callback& cb) = 0;
+ virtual void WorkerBarrierV2(int barrier_id, int task_id, int task_num, int token, const Callback& cb) = 0;
virtual int ServerSize(int id) = 0;
virtual int ServerTypeSize() = 0;
};
diff --git a/xdl/ps-plus/ps-plus/client/client_wrapper_impl.cc b/xdl/ps-plus/ps-plus/client/client_wrapper_impl.cc
index 51a8ba06..115fed50 100644
--- a/xdl/ps-plus/ps-plus/client/client_wrapper_impl.cc
+++ b/xdl/ps-plus/ps-plus/client/client_wrapper_impl.cc
@@ -21,6 +21,7 @@ limitations under the License.
using ps::service::seastar::CallBackClosure;
using ps::service::seastar::SeastarClientLib;
+using ps::service::seastar::EventClientLib;
using ps::service::seastar::SeastarStatus;
namespace ps {
@@ -227,6 +228,125 @@ void ClientWrapperImpl::Restore(const std::string& version, const Callback& cb)
client_lib_->Request(0, func_ids::kSchedulerRestore, request_datas, cb_closure);
}
+Status ClientWrapperImpl::InitGlobalQueue(
+ const std::string& name,
+ const std::vector<std::string>& paths,
+ size_t epochs,
+ bool epoch_isolate) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(name),
+ new WrapperData<std::vector<std::string> >(paths),
+ new WrapperData<size_t>(epochs),
+ new WrapperData<bool>(epoch_isolate)
+ };
+
+ std::promise<Status> p;
+ CallBackClosure* cb_closure =
+ new CallBackClosure([&p](const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ Status st = GetNetworkStatus(sst, response);
+ p.set_value(st);
+ });
+
+ client_lib_->Request(0, func_ids::kSchedulerInitGlobalFileQueue,
+ request_datas, cb_closure);
+ return p.get_future().get();
+}
+
+Status ClientWrapperImpl::GetNextFile(
+ const std::string& name,
+ size_t worker_id,
+ std::string* path,
+ size_t* begin,
+ size_t* epoch) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(name),
+ new WrapperData<size_t>(worker_id)
+ };
+
+ std::promise<Status> p;
+ CallBackClosure* cb_closure =
+ new CallBackClosure([&p, path, begin, epoch, this](
+ const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ Status st = GetNetworkStatus(sst, response);
+ if (!st.IsOk()) {
+ p.set_value(st);
+ return;
+ }
+
+ if (response.size() != 4) {
+ p.set_value(Status::Unknown("response data not match"));
+ return;
+ }
+
+ WrapperData<std::string>* path_data = dynamic_cast<WrapperData<std::string>* >(response[1]);
+ WrapperData<size_t>* begin_data = dynamic_cast<WrapperData<size_t>* >(response[2]);
+ WrapperData<size_t>* epoch_data = dynamic_cast<WrapperData<size_t>* >(response[3]);
+ if (path_data == nullptr || begin_data == nullptr || epoch_data == nullptr) {
+ p.set_value(Status::Unknown("response data type not match"));
+ return;
+ }
+
+ *path = path_data->Internal();
+ *begin = begin_data->Internal();
+ *epoch = epoch_data->Internal();
+ p.set_value(Status::Ok());
+ });
+
+ client_lib_->Request(0, func_ids::kSchedulerGetNextFile,
+ request_datas, cb_closure);
+ return p.get_future().get();
+}
+
+Status ClientWrapperImpl::ReportWorkerState(
+ const std::string& name,
+ size_t worker_id,
+ const std::vector& worker_states) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(name),
+ new WrapperData<size_t>(worker_id),
+ new WrapperData<std::vector<WorkerState> >(worker_states)
+ };
+
+ std::promise<Status> p;
+ CallBackClosure* cb_closure =
+ new CallBackClosure([&p](const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ Status st = GetNetworkStatus(sst, response);
+ p.set_value(st);
+ });
+
+ client_lib_->Request(0, func_ids::kSchedulerReportWorkerState,
+ request_datas, cb_closure);
+ return p.get_future().get();
+}
+
+Status ClientWrapperImpl::RestoreWorkerState(
+ const std::string& name,
+ size_t worker_id) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(name),
+ new WrapperData<size_t>(worker_id)
+ };
+
+ std::promise<Status> p;
+ CallBackClosure* cb_closure =
+ new CallBackClosure([&p](const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ Status st = GetNetworkStatus(sst, response);
+ p.set_value(st);
+ });
+
+ client_lib_->Request(0, func_ids::kSchedulerRestoreWorkerState,
+ request_datas, cb_closure);
+ return p.get_future().get();
+}
+
void ClientWrapperImpl::ModelServerForward(int server_type, int server_id, const Tensor& ids, std::unique_ptr<Tensor>* rst, const Callback& cb) {
std::vector<Data*> request_datas = {
new WrapperData<Version>(scheduler_version_),
@@ -268,9 +388,10 @@ void ClientWrapperImpl::ModelServerBackward(int server_type, int server_id, cons
request_datas, cb_closure);
}
-void ClientWrapperImpl::TriggerStreamingModelDense(const Callback& cb) {
+void ClientWrapperImpl::TriggerStreamingModelDense(const std::string& stream_ver, const Callback& cb) {
std::vector<Data*> request_datas = {
- new WrapperData<Version>(scheduler_version_)
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(stream_ver)
};
CallBackClosure* cb_closure = new CallBackClosure([cb](const SeastarStatus& sst, const std::vector<Data*>& response) {
@@ -280,9 +401,10 @@ void ClientWrapperImpl::TriggerStreamingModelDense(const Callback& cb) {
client_lib_->Request(0, func_ids::kSchedulerTriggerStreamingDense, request_datas, cb_closure);
}
-void ClientWrapperImpl::TriggerStreamingModelSparse(const Callback& cb) {
+void ClientWrapperImpl::TriggerStreamingModelSparse(const std::string& stream_ver, const Callback& cb) {
std::vector<Data*> request_datas = {
- new WrapperData<Version>(scheduler_version_)
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(stream_ver)
};
CallBackClosure* cb_closure = new CallBackClosure([cb](const SeastarStatus& sst, const std::vector<Data*>& response) {
@@ -292,9 +414,10 @@ void ClientWrapperImpl::TriggerStreamingModelSparse(const Callback& cb) {
client_lib_->Request(0, func_ids::kSchedulerTriggerStreamingSparse, request_datas, cb_closure);
}
-void ClientWrapperImpl::TriggerStreamingModelHash(const Callback& cb) {
+void ClientWrapperImpl::TriggerStreamingModelHash(const std::string& stream_ver, const Callback& cb) {
std::vector<Data*> request_datas = {
- new WrapperData<Version>(scheduler_version_)
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<std::string>(stream_ver)
};
CallBackClosure* cb_closure = new CallBackClosure([cb](const SeastarStatus& sst, const std::vector<Data*>& response) {
@@ -376,6 +499,28 @@ void ClientWrapperImpl::WorkerReportFinish(int id, const Callback& cb) {
request_datas, cb_closure);
}
+void ClientWrapperImpl::GetWorkerFinishCount(int64_t* count, const Callback& cb) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_)
+ };
+ CallBackClosure* cb_closure =
+ new CallBackClosure([count, cb](const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ Status st = GetNetworkStatus(sst, response);
+ if (!st.IsOk()) {
+ cb(st);
+ return;
+ }
+ if (count) {
+ WrapperData<int64_t>* res = dynamic_cast<WrapperData<int64_t>*>(response[1]);
+ *count = res->Internal();
+ }
+ cb(Status::Ok());
+ });
+ client_lib_->Request(0, func_ids::kSchedulerGetWorkerFinishCount,
+ request_datas, cb_closure);
+}
+
void ClientWrapperImpl::WorkerBarrier(int id, int worker_count, const Callback& cb) {
std::vector<Data*> request_datas = {
new WrapperData<Version>(scheduler_version_),
@@ -391,10 +536,32 @@ void ClientWrapperImpl::WorkerBarrier(int id, int worker_count, const Callback&
request_datas, cb_closure);
}
+void ClientWrapperImpl::WorkerBarrierV2(
+ int barrier_id,
+ int task_id,
+ int task_num,
+ int token,
+ const Callback& cb) {
+ std::vector<Data*> request_datas = {
+ new WrapperData<Version>(scheduler_version_),
+ new WrapperData<int>(barrier_id),
+ new WrapperData<int>(task_id),
+ new WrapperData<int>(task_num),
+ new WrapperData<int>(token)
+ };
+ CallBackClosure* cb_closure =
+ new CallBackClosure([cb](const SeastarStatus& sst,
+ const std::vector<Data*>& response) {
+ cb(GetNetworkStatus(sst, response));
+ });
+ client_lib_->Request(0, func_ids::kSchedulerWorkerBarrierV2,
+ request_datas, cb_closure);
+}
+
Status ClientWrapperImpl::CreateServerLib() {
if (client_lib_singleton_ == nullptr) {
std::vector> server_addrs = {};
- client_lib_singleton_ = new ClientLib(server_addrs, 100, 1);
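+ // Was hard-coded to 1; now sized to the host's hardware concurrency.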
+ client_lib_singleton_ = new ClientLib(server_addrs, 100, std::thread::hardware_concurrency());
client_lib_ = client_lib_singleton_;
client_lib_->Start();
} else {
diff --git a/xdl/ps-plus/ps-plus/client/client_wrapper_impl.h b/xdl/ps-plus/ps-plus/client/client_wrapper_impl.h
index 7ee8cecd..fbe9251b 100644
--- a/xdl/ps-plus/ps-plus/client/client_wrapper_impl.h
+++ b/xdl/ps-plus/ps-plus/client/client_wrapper_impl.h
@@ -37,19 +37,26 @@ class ClientWrapperImpl : public ClientWrapper {
void RegisterUdf(size_t server_id, const UdfChain& def, const Callback& cb) override;
void Save(const std::string& version, const Callback& cb) override;
void Restore(const std::string& version, const Callback& cb) override;
+ Status InitGlobalQueue(const std::string& name, const std::vector<std::string>& paths, size_t epochs, bool epoch_isolate = false) override;
+ Status GetNextFile(const std::string& name, size_t worker_id, std::string* path, size_t* begin, size_t* epoch) override;
+ Status ReportWorkerState(const std::string& name, size_t worker_id, const std::vector<WorkerState>& worker_states) override;
+ Status RestoreWorkerState(const std::string& name, size_t worker_id) override;
void ModelServerForward(int server_type, int server_id, const Tensor& ids, std::unique_ptr<Tensor>* rst, const Callback& cb) override;
void ModelServerBackward(int server_type, int server_id, const Tensor& ids, const Tensor& grads, const Callback& cb) override;
- void TriggerStreamingModelDense(const Callback& cb) override;
- void TriggerStreamingModelSparse(const Callback& cb) override;
- void TriggerStreamingModelHash(const Callback& cb) override;
+ void TriggerStreamingModelDense(const std::string& stream_ver, const Callback& cb) override;
+ void TriggerStreamingModelSparse(const std::string& stream_ver, const Callback& cb) override;
+ void TriggerStreamingModelHash(const std::string& stream_ver, const Callback& cb) override;
void AsynchronizeEnter(int id, int staleness, int worker_count, const Callback& cb) override;
void SynchronizeEnter(int id, int worker_count, int64_t* token, const Callback& cb) override;
void SynchronizeLeave(int id, int64_t token, const Callback& cb) override;
void WorkerReportFinish(int id, const Callback& cb) override;
+ void GetWorkerFinishCount(int64_t* count, const Callback& cb);
void WorkerBarrier(int id, int worker_count, const Callback& cb) override;
+ void WorkerBarrierV2(int barrier_id, int task_id, int task_num, int token, const Callback& cb) override;
int ServerSize(int id) override;
int ServerTypeSize() override;
+ //using ClientLib = ps::service::seastar::SeastarClientLib;
using ClientLib = ps::service::seastar::EventClientLib;
private:
Status CreateServerLib();
diff --git a/xdl/ps-plus/ps-plus/client/local_client.cc b/xdl/ps-plus/ps-plus/client/local_client.cc
index 28b8d16e..a1778c51 100644
--- a/xdl/ps-plus/ps-plus/client/local_client.cc
+++ b/xdl/ps-plus/ps-plus/client/local_client.cc
@@ -87,20 +87,26 @@ void LocalClient::IdentityInitializer(const std::string& variable_name,
}
void LocalClient::HashInitializer(const std::string& variable_name,
- Initializer* init,
+ Initializer* init,
const LocalClient::Callback& cb) {
VariableInfo info;
CHECK_ASYNC(local_server_->GetVariableInfo(variable_name, &info));
std::vector<size_t> dims(info.shape.begin(), info.shape.end());
size_t k = info.shape[0];
dims[0] = k + 10 * sqrt(k) + 10;
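+ // Same "k1=v1&k2=v2" flattening of the variable args as in Client::HashInitializer.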
+ std::string extra_info;
+ for (auto& arg : info.args) {
+ extra_info += arg.first + "=" + arg.second + "&";
+ }
+ if (!extra_info.empty()) { extra_info.pop_back(); }
std::vector<Data*> inputs = Args(
info.datatype,
TensorShape(dims),
+ extra_info,
std::unique_ptr<Initializer>(init));
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
- UdfData udf("HashVariableInitializer", UdfData(0), UdfData(1), UdfData(2));
+ UdfData udf("HashVariableInitializer", UdfData(0), UdfData(1), UdfData(2), UdfData(3));
Callback realcb = [cb, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
cb(st);
@@ -143,8 +149,8 @@ void LocalClient::DensePull(const std::string& variable_name,
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
UdfData udf("BuildDenseSlice", UdfData(0));
- UdfData udf_chain("SliceToTensor", UdfData("TransSlice", udf));
- Callback realcb = [this, cb, result, outputs, &variable_name](const Status& st) {
+ UdfData udf_chain("SliceToTensor", udf);
+ Callback realcb = [this, cb, result, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
if (!st.IsOk()) {
cb(st);
@@ -156,13 +162,19 @@ void LocalClient::DensePull(const std::string& variable_name,
return;
}
- WrapperData<Tensor>* output_ptr = dynamic_cast<WrapperData<Tensor>*>((*outputs)[0].get());
+ WrapperData<std::vector<Tensor>>* output_ptr =
+ dynamic_cast<WrapperData<std::vector<Tensor>>*>((*outputs)[0].get());
if (output_ptr == nullptr) {
- cb(Status::ArgumentError("Output[0] should be tensor"));
+ cb(Status::ArgumentError("Output[0] should be tensor vector"));
return;
}
- *result = output_ptr->Internal();
+ if (output_ptr->Internal().size() != 1) {
+ cb(Status::ArgumentError("Output[0] size should be 1"));
+ return;
+ }
+
+ *result = output_ptr->Internal()[0];
cb(Status::Ok());
};
@@ -199,8 +211,8 @@ void LocalClient::SparsePull(const std::string& variable_name,
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
UdfData udf("BuildSparseSlice", UdfData(0), UdfData(1));
- UdfData udf_chain("SliceToTensor", UdfData("TransSlice", udf));
- Callback realcb = [cb, result, outputs](const Status& st) {
+ UdfData udf_chain("SliceToTensor", udf);
+ Callback realcb = [this, cb, result, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
if (!st.IsOk()) {
cb(st);
@@ -212,14 +224,19 @@ void LocalClient::SparsePull(const std::string& variable_name,
return;
}
- WrapperData<Tensor>* output_ptr =
- dynamic_cast<WrapperData<Tensor>*>((*outputs)[0].get());
+ WrapperData<std::vector<Tensor>>* output_ptr =
+ dynamic_cast<WrapperData<std::vector<Tensor>>*>((*outputs)[0].get());
if (output_ptr == nullptr) {
- cb(Status::ArgumentError("Output[0] should be tensor"));
+ cb(Status::ArgumentError("Output[0] should be tensor vector"));
return;
}
- *result = output_ptr->Internal();
+ if (output_ptr->Internal().size() != 1) {
+ cb(Status::ArgumentError("Output[0] size should be 1"));
+ return;
+ }
+
+ *result = output_ptr->Internal()[0];
cb(Status::Ok());
};
@@ -252,16 +269,19 @@ void LocalClient::SparsePush(const std::string& variable_name,
}
void LocalClient::HashPull(const std::string& variable_name,
- const Tensor& ids,
- double filter_ratio,
+ const Tensor& ids,
+ const float& save_ratio,
Tensor* result,
const LocalClient::Callback& cb) {
- std::vector<Data*> inputs = Args(ids, false, 1.0);
+ std::vector<Tensor> ids_vec = {ids};
+ std::vector<std::string> name_vec = {variable_name};
+ std::vector<float> save_ratio_vec = {save_ratio};
+ std::vector<Data*> inputs = Args(ids_vec, name_vec, save_ratio_vec, false, true);
std::vector<std::unique_ptr<Data>>* outputs =
new std::vector<std::unique_ptr<Data>>;
- UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2));
- UdfData udf_chain("SliceToTensor", UdfData("TransSlice", udf));
- Callback realcb = [cb, result, outputs](const Status& st) {
+ UdfData udf("BuildHashSlice", UdfData(0), UdfData(1), UdfData(2), UdfData(3), UdfData(4));
+ UdfData udf_chain("SliceToTensor", udf);
+ Callback realcb = [this, cb, result, outputs](const Status& st) {
std::unique_ptr<std::vector<std::unique_ptr<Data>>> deleter(outputs);
if (!st.IsOk()) {
cb(st);
@@ -273,33 +293,84 @@ void LocalClient::HashPull(const std::string& variable_name,
return;
}
- WrapperData<Tensor>* output_ptr =
- dynamic_cast<WrapperData<Tensor>*>((*outputs)[0].get());
+ WrapperData<std::vector<Tensor>>* output_ptr =
+ dynamic_cast<WrapperData<std::vector<Tensor>>*>((*outputs)[0].get());
if (output_ptr == nullptr) {
- cb(Status::ArgumentError("Output[0] should be tensor"));
+ cb(Status::ArgumentError("Output[0] should be tensor vector"));
return;
}
- *result = output_ptr->Internal();
+ if (output_ptr->Internal().size() != 1) {
+ cb(Status::ArgumentError("Output[0] size should be 1"));
+ return;
+ }
+
+ *result = output_ptr->Internal()[0];
cb(Status::Ok());
};
Process(udf_chain, variable_name, inputs, outputs, realcb);
}
+void LocalClient::MergedHashPull(const std::vector<std::string>& var_names,
+ const std::vector